Mul
对两个输入数据执行逐元素乘法运算。支持实数类型和复数类型。
\[\text{对于实数类型:}\quad \mathrm{output}_i = \mathrm{input0}_i \times \mathrm{input1}_i\]
\[\text{对于复数类型:}\quad \mathrm{input0}_i = a+bi,\ \mathrm{input1}_i = c+di \;\Rightarrow\; \mathrm{output}_i = (a+bi) \times (c+di) = (ac - bd) + (ad + bc)i\]
- 输入:
input0 - 第一个输入数据地址。
input1 - 第二个输入数据地址。
length - 计算长度,即参与运算的元素个数(对于复数类型,指复数的个数,而不是 float/double 标量的个数;每个复数在内存中占用实部、虚部两个标量)。
core_mask (int) - 核掩码。仅共享存储版本(_s 后缀接口)具有该参数,私有存储版本(_p 后缀接口)无此参数。
- 输出:
output - 计算结果地址。
- 支持平台:
FT78NE、MT7004
备注
FT78NE 支持:int8 (i8), int16 (i16), int32 (i32), fp32 (fp), fp64 (dp), cplx64 (c64), cplx128 (c128)
MT7004 支持:int16 (i16), int32 (i32), fp16 (hp), fp32 (fp), cplx64 (c64)
复数类型(cplx64/cplx128)在内存中以实部、虚部交替存储,运算遵循复数乘法公式。
共享存储版本:
- void i8_mul_s(int8_t *input0, int8_t *input1, int8_t *output, int length, int core_mask)
- void i16_mul_s(int16_t *input0, int16_t *input1, int16_t *output, int length, int core_mask)
- void i32_mul_s(int32_t *input0, int32_t *input1, int32_t *output, int length, int core_mask)
- void hp_mul_s(half *input0, half *input1, half *output, int length, int core_mask)
- void fp_mul_s(float *input0, float *input1, float *output, int length, int core_mask)
- void dp_mul_s(double *input0, double *input1, double *output, int length, int core_mask)
- void c64_mul_s(float *input0, float *input1, float *output, int length, int core_mask)
- void c128_mul_s(double *input0, double *input1, double *output, int length, int core_mask)
C调用示例:
// FT78NE 示例:复数类型 cplx64 共享存储多核计算
#include <stdio.h>
#include "78NE/utils.h"

int main(int argc, char* argv[]) {
    float *in0 = (float *)0xA0000000; // 输入0 (包含 real, imag)
    float *in1 = (float *)0xA1000000; // 输入1
    float *out = (float *)0xB0000000; // 输出
    int num_complex = 480000; // 复数个数
    int core_mask = 0xFF;
    c64_mul_s(in0, in1, out, num_complex, core_mask);
    return 0;
}
私有存储版本:
- void i8_mul_p(int8_t *input0, int8_t *input1, int8_t *output, int length)
- void i16_mul_p(int16_t *input0, int16_t *input1, int16_t *output, int length)
- void i32_mul_p(int32_t *input0, int32_t *input1, int32_t *output, int length)
- void hp_mul_p(half *input0, half *input1, half *output, int length)
- void fp_mul_p(float *input0, float *input1, float *output, int length)
- void dp_mul_p(double *input0, double *input1, double *output, int length)
- void c64_mul_p(float *input0, float *input1, float *output, int length)
- void c128_mul_p(double *input0, double *input1, double *output, int length)
C调用示例:
// MT7004 示例:fp16 (half) 类型私有存储单核计算
#include <stdio.h>

int main(int argc, char* argv[]) {
    // 输入与输出均位于私有存储空间
    half *in0 = (half *)0x10000000;
    half *in1 = (half *)0x10001000;
    half *out = (half *)0x10002000;
    int length = 1024;
    hp_mul_p(in0, in1, out, length);
    return 0;
}